! CM " CSCT ^ CSA ^ c ^CTCTCTTeCCTATeSATTeACAAACeCAAACTTCTeATCGA 

TXACAAGTCArrCAAACACaXCAAMTCTC-ATCCCTATMCACAATAm^CAAAT " 

1 21 !"!!f^"!^ TT ! T ^^^^C^AACTTGA^CC^AAT^C? 1 

TATCTCATGTTTCTACAATTAAAAAAATTGTTTTTTTTTCCA^^AA^CCAACA^T 1 



120 
30 



241 ^:^^^*f^^^ I ^C^TAAACACGCCTTKCmCTTm 

AATATTCTATTACAOOTT^TTCTCCC^ilTC^ ^ 



3S1 + 

42 



- + + + ^ + 



1 I ^!f^^^f^ TCACTMCT ^GA«SAAAGGATAAAC«ArrcrrGATATTTCA ' 

— — — f _ ^ ^QQ 

CTG7TTTAC7CATTCCCTTT7TAAATAAGAAC7ATArGCCGATTTGCCCATATATTTTTC 

541 ni A ii A ff^ c if AcAT ~ cTGTAcAATs " TcTArc 540 

GAAAAtTCGAATTTATTTTTCTCTACTTTTTACTCGTTGCATTCGlcATclKATA^ 
601 *™"~™*~~™~+»~*™— — i 

CCGCTCTATTtATATTCAACGAtTTTTATAAATTACTACTCCTTCATGT^^TTTCATT " 
6 SI ~ —— -~— _ — ^^.^.^^ . r _ ^ _ _ _ _ _ 

721 rilllVJ^l^ KC1 ^ X7 ^^ 

+ + ^ + ^ ^ ^ 



78 1 I~If I!!*"! A ^ TTCAACGTATTTT ' rATCC CTCACAATTTATCCACATTTCCCGCTT 

GGAGAITTATCCTCXATATTACArGCCTGTTTTTTTAAAGGATATAATGTTTMCAAATA 
841 ————^^ » ^. t . 



901 A " TTTTATCAATCCTATTGTATATTCTCCAKTAACCG TTGTTTCGAAAACATCACCTA 

CCATTTTAAAAtTCACAAAATCTTGCTTCCTTATAATCAAGAAGATTTTTCAGATGCTCT 

♦ + + 1Q20 

* M L C 

102 ^ _^ TCCMTGCCCCCC ^ TGAGCACCCCACACACCACGC 

.eiecralstIht TTTTTTT'p 1080 

T nll€2 

1081 C ^ CTCA ff CATTCACTTA ^ TAG ^^^AAAAACATrrTCACAGAAGATCATTCTCAAC 

*DALT*LECXNIFTE TTTTl 114 ° 

30 40 

TTATCAGTAAAATGTCAACTCGCC7CGAGAGGAT,CCCCAATTT7CTTCGAATCTATCGAC 
1141 + ^ — — + k 

XSXMSTRLERIANFL iTT~~iT~R 1200 
50 60 
1 2 o i f 3! AAGC ll^ 7C:AACrrC:GACCACTCATCG ACTTTT7CAAC "ACAACAATC AAAG7CACC 

QASELCPLIDFFNYNNQ ~h""l 
70 80 
12 6 1 ' «GCTGA?TTCCTCGAAGAC7ACATCGATTTTGCGAXAAATGACCCAGATC?ACTTCCTC 

AD FLEDTIDFAINE? D**!""? 

90 100 



^ CA CTAG T CATTGCTCCACAATTT7CCCC ACAAA7CCTCGAT AGGAAAC7 ATTGCTTGGGA 

VVlA? QrSRQHLDRX l"T"l"~n 
"° 120 



1330 



FIGURE 1 



T n22 74 

atcttccaaaacaaatgacatcctxtattcgagagtatcacctccxtIcactcatcaaaa 

1381 ♦ + + + * + 1440 

VPKQMTCriRE^HVDRVIKX 
130 140 

ilncron 1 
TCAGAAAACTCCAACCTCTCCTGTTTATTATAATC 

LDEMCOLO 
I ISO 

T7GC77AAAC77CA»C7CC777777C7G777C7ACACGGCCGACC7GGATCCGGAAAA7 

SFFLFLHGRACSC.XS 

ISO 

ilntron 2 
7GAC7GG7AT 

1551 + + + + + , 1S20 

VIASQALSKSDQLIGI 
170 1 ISO 
TATCTGAATCTACCGATCTTCATTCTAXTACACSAAATTATGAT7CAATCGTTTGGCTCAA 
1521 * * + 1 + + 1S3 0 

NtDSIVWLK 
190 

AGATAGTGGAACAGCTCCAAAATCTACATTCGATTTATTTACGGATATTTTGCTGATCCT 
1581 * + + + + + 1740 

D5G7APKS7FD LF7DILLML 

200 210 

A nl920/n224 7 



JIntron 1 
7GAG7GAA7ACAG7CCA7G7AACA77CACCA7GA7777C 



"CAAA77A7GAAAA777GA 

1741 ♦ + * + + + 1800 

K 

CC7GG77ACC7777AA777CA7A777CC7GACGC77GCA7G7777C7G7G777CAAGACG 
1801 + + + h + I860 

ACCCCG7C77C7GAGCGACACGGATGAC7CGCA77CGA7CACCGAC77CA77AACCC7C7 

1351 + + + ♦ <► + 1920 

A. n2273 

7C777CAAdAAGCGAAGACGA7C77C7CAA777CCCA7CCC7GGAGCA7G7CACGICAG7 

SEDDLLHFP SVEHV7SV 
220 

ilfltron 4 
7AAC77GC77GCCGA77C7CG7ACAA7A7C77AAA77AT7CGT 

1931 + + + + * + 204 0 

V L X R .M 
230 I 

7777AcK7C7GCAACGCAC7CA77CA7CG7CCAAA7AC777A77CG7A777GA7GACG7A 

ICNALIDRP NT LFVFDDV 
240 250 
A nl948 7 nl947 

\ \ 

G77CAAGAACAAACAAT7CG77GGGC7CACCACC7ACG7C77CGA7G7CT7C7AAC7AC7 

VQEE7IRWAQELRLRCLV77 

260 270 
CG7GACG7GGAAA7A7CAAA7GC7GC77C7CAAACA7GCGAA77CA77CAAG7GACATCA 
2151 * + + * * ♦ 2220 

RDVEISNAASQ7CEFIEV7S 

230 290 
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TTCGAAATCCATGAATGTTATGATTTTCTAGAAGCTTATGGAATGCCCATGCCTGT7GGA 
2221 ♦ * + ♦ h 2280 

LEIDECTDFLEAYGMPMPVG 

300 3X0 

Tc4 

CAAAAACAAGAAGATG7GCTTAATAAAACAATCCAA 

EKEEOVLNXTIELSSGNPAT 

320 3 3o 

flncron 5 

CTTATGATGTTTTTCAAGTCTTGTCAACCGAAAACArrrCAAAAaTGAGTGGGACATACC 

LMMFFKSC EPKTFEK 

330 

AArTTGAGACTTTTAAAATAATTTATTCTACAATAAAAGTTAATCAAAAAGTTTCATACC 
2401 * -f «+ + h + 2460 

TCATTG7CTTTAAATTTTACGAATTGACGATCAAAATCAACAATTAGGATCCTCGCACGA 
24 61 + — + ♦ + * * 2520 

GACAAAACTGTG7ACCTACCGTACCCCACACATTTTCT7GATATTTGCCATCCATT7AAT 
2521 +- + + + + + 2530 

tttttaagaaaattaicgttttacataattgaacaagagatacacggtctcgacccgacg 
gaaatttttfaaatcaaagcgagtatgagcctcttttcattatttttcgattttctcttg 
ttgtttctttttatttaaack:cttttattttgaaacaagtctaaaaatattaaaaactga 
ataaaatatttaaaaaaaatcaagtaaaatagaaaaacagcaaggctggagactactgta 
cttcttaaatccgca-actctttttatttaatcattttccggaatgtcgaaacgaaataa 

2821 + + + + + + 2880 

tacatttttagtccaaaatcgctaggtatattcttaaaattatcaaacattttgcattca 

2881 -r ♦ + + + + + 2940 

C^ATGGCACAGCTTAATAACAAATTCGAAAGTCCAGGATTAGTCGGTGTTGAATGtATCA 
2941 + + + * + + 3000 

MAQLNNXLESRGLVGVECIT 
340 350 

CCCC77ACTCG7ACAAG7CAC7CGCAA7GGC7C7TCAAAGA7C7G77GAAC7T77C7CAC 
3001 + + + + ♦ ^ 3Q60 

PYSYKSLAMALQRCVEVLSD 
360 370 

ATGAGGATCGAAGTGCTCTTGCTTTCGCAGTTGTCATGCCTCCIGGAGTTGATAXACCCG 

3061 + + + + > + 31 20 

EDRS.ALAFAVVMPPGVOIPV 
380 390 
A nl3$4 

\ 

tcaagctatggtcatgtgttarrccagttgatatttgrrcaaatgaacaacaacaattcg 
xl'wscvipvdicsneeeqld 

400 410 

I Incron 6 

ATGATGAACTTGCGGATCGCTTGAAAAGACTCAGCA>CTATGAGTCTTGAAATTTGAAGA 
DEVADRLXRLSX + 



420 | 

TTCAcKcGTC 



TTTAAATTAACACrTAAAArrTCAGACGTCGACCTCTTCTCAGTGGAAAACCAATGCCCC 

RGALLSCXRMPV 
430 440 
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TXTTCACAX7CAAAAXTGAXCATATXAXCCAXAXCTTCXTGAAACACGXCCXXGAXCCAC 

3301 + * + + ♦ * 3360 

LTFKIDHIIHMFLKHVVDAQ 

450 460 

ilntron 7 I 
TATGCTGAAAATGTCTCAACTTTCAATTAAATTTTAAArrTTCAckAT 

3361 ——«—+-— ™+_™ + — - — - — — — .+ 3420 

T I A H 
GGAATCTCAATTCTCGAGCAGCGTCTTC7TGAAATAGGAAACAATAATGTATCAGTACCG 

3421 + +- +> + h + 3480 

GISI LEQRLLEI GNNNVSVP 

470 480 
GACCGACAXAXACCAXCACAXTXCCAAAAATTCCGXCCXXCAXCAGCCACXGAGATGXAX 
3481 + ♦ + + + + 3540 

ERHIPSHFQKFRRSSASEMY 

500 510 
CCAAAAACXACACAACAAACXGXCAXCCGTCCTGAACACXTCCCAAACTTCAXGCAAXTG 

3541 + + ♦ + + + 3600 

PKXTEETVIRP EDFPXFMQL 

520 530 
CACCAGAAATTCTATGACTCCCTCAAAAATTTTGCATGCTGTTAAAACCTATCGTGTACA 

3601 + + + + * + 3660 

HQXF.^DSLXNFACC* 
540 

ATATTGCCTCTATATTCCCCTCGAAATACGTTTATACTTTTTCGCACGAG7TTTCTCATT 

HI 3661 + -f + + + + 3720 

vj TTTTCATTTCTACTTGTTTTATTTCTCTCCAAAATTTCAGATCTATCCCAAATGTTCT7A 

J 3721 + + + + + + 3780 

21 AATTTAATGTTTTCTACAGATACTCAACACATCTTGTTTCATCTCATCCTTGCTT7TTTT 

Ui 3731 + + + + + + 3 g 4 Q 

TTrCAAATATATTCAGTTTCTTTTATAATTTTAATTAATCGAATTAATACATTCACGTAA 
38 41 + + + + ♦ 3900 

' AGAAXTXCCXGGACXAXXAXXXXAXCGCAXCCAAAXGATXXAXXCCCXAX7GXXCCAAAC 
^ 3901 + + + + + + 3 9S0 

U XXCCAAATXGAXCAXXXTXAAACACGCCTCAXTAAATTGAAAGXCGTACTTXXAGXCXCG 

01 3 961 + + + + + + 4020 

AACATGAACTAACTXAXTXXCTCXCTTCXAAAXTCAAAGXCCATTCCAAAAGGACAXXXC 

4021 + + —+ + + + 4080 

=4= ATGAGTTTTCACGAAAACCCTAAXTTTTACAAXTTCCTXXCACrrXTCAAGAXCXXCGAX 

CJ 4031 * - ; + + + + ♦ 4140 

p TTCXTTCCTCXGXxiGCGXCAXXACXACAXXTGCTXTCCXCCTTCACTTTAXCGACAXXC 

4141 ♦ + + + > + 4200 

I XTGCCArCAAXCGACXXCCAXCTAGACCCAXAGCACXCTXCATAXCAXXAXCCCXGXAXA 

42C1 + ♦ + + ♦ + 4260 

XXGTACXCTT7CAGXAXXTTAACXXATCGAXXACGTACXAXAXXCAGXGGXTCACXGTTX 

4 2 51 + + + «► + + 4 320 

XCGGTCAAXGGGXGACACGXGCXCGACGANNAAX.X7XCAACGAACCCAATCXCCXACTCA 

4321 ♦ — : ♦ + • + h ♦ 4380 

CTXAXCAACCAAGACCCCXCACCCATG 
4381 + ► 4407 



G 
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ced-3 Genomic Sequence 



i 



AGATCTGAAATAAGGTGATAAATTAATAAATTAAGTGTATTTCTGAGGAAATTTGACTGT 



-r ^ + + + + 6Q 

TTTAGCACAATTAATCTTGTTTCAGAAAAAAAGTCCAGTTTTCTAGATTTTTCCGTCTTA 
61 + + + + ^ + 

TTGTCGAATTAATATCCCTATTATCACTTTTXCATGCTCATCCTCGAGCGGCACGTCCTC 

+ (■ + + |> -+ 180 

AAAGAATTGTGAGAGCAAACGCGCTCCCATTGACCTCCACACTCAGCCGCCAAAACAAAC 

+ + + + + + 2 40 

GTTCGAACATTCGTGTGTTGTGCTCCTTTTCCGTTATCTTGCAGTCATCTTTTGTCGTTT 
241 + + + + + + 3Q0 

TTTTCTTTGTTCTTTTTGTTGAACGTGTTGCTAAGCAATTATTACATCAATTGAAGAAAA 
+ + + + + ^ 

GGCTCGCCGATTTATTGTTGCCAGAAAGATTCTGAGATTCTCGAAGTCGATTTTATAATA 
+ + + + + + 

TTTAACCTTGGTTTTTGCATTGTTTCGTTTAAAAAAACCACTGTTTATGTGAAAAACGAT 
421 + + + + + + 48Q 



121 
181 



301 
361 



481 
541 
601 
661 
721 
781 
841 
901 
961 
1021 
1081 
1141 



TAGTTTACTAATAAAACTACTTTTAAACCTTTACCTTTACCTCACCGCTCCGTGTTCATG 
+ + + + + (. 

GCTCATAGATTTTCGATACTCAAATCCAAAAATAAATTTACGAGGGCAATTAATGTGAAA 

CAAAAACAATCCTAAGATTTCCACATGTTTGACCTCTCCGGCACCTTCTTCCTTAGCCCC 
+ + + . + + + 

ACCACTCCATCACCTCTTTGGCGGTGTTCTTCGAAACCCACTTAGGAAAGCAGTGTGTAT 
+ + + + + + 

CTCATTTGGTATGCTCTTTTCGATTTTATAGCTCTTTGTCGCAATTTCAATGCTTTAAAC 

AATCCAAATCGCATTATATTTGTGCATGGAGGCAAATGACGGGGTTGGAATCTTAGATGA 
+ + + + + + 

GATCAGGAGCTTTCAGGGTAAACGCCCGGTTCATTTTGTACCACATTTCATCATTTTCCT 
+ - + + + + + 

GTCGTCCTTGGTATCCTCAACTTGTCCCGGTTTTGTTTTCGGTACACTCTTCCGTGATGC 

CACCTGTCTCCGTCTCAATTATCGTTTAGAAATGTGAACTGTCCAGATGGGTGACTCATA 
+ + + + + + 

TTGCTGCTGCTACAATCCACTTTCTTTTCTCATCGGCAGTCTTACGAGCCCATCATAAAC 
+ + + + + + 

TTTTTTTTCCGCGAAATTTGCAATAAACCGGCCAAAAACTTTCTCCAAATTGTTACGCAA 
TATATACAATCCATAAGAATATCTTCTCAATGTTTATGATTTCTTCGCAGCACTTTCTCT 



1261 



1321 



540 
600 
660 
720 
760 
840 
900 
960 
1020 
1080 
1140 
1200 



TCGTGTGCTAACATCTTATTTTTATAATATTTCCGCTAAAATTCCGATTTTTGAGTATTA 
1201 + + + + + + 126Q 

ATTTATCGTAAAATTATCATAATAGCACCGAAAACTACTAAAAATGGTAAAAGCTCCTTT 
+ + + + + + 

Repeat 1 

TAAATCGGCTCGACATTATCGTATTAAGGAATCACAAAATTCTGAGAATGCGTACTGCGC 
+ + + + + + 



AACATATTTGACGGCAAAATATCTCGTAGCGAAAACTACAGTAATTCTTTAAATGACTAC 
1381 + + + + + + i44Q 

Repeat 1 

> < 

TGTAGCGCTTGTGTCGATTTACGGGCTCAATTTTTGAAAATAATTTTTTTTTTCGWTTT 
1441 + + - — + + " + -~+ 1500 
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15 oi I^„!";!^ tcgt ^^ ckta ^ ctagt «"taaag^^ctctIcttc^ 

+ + + + + 1S60 



1<21 ifffi^i^ii^f^f^^iiifi^^^^"^^^^^^^;^^ 1620 

1681 !i.i.^ A f !f ™™ t^gI^c^^^cct^;;^;^;^ 1 680 

17 « ^™fi^iiiif!i^"^^=^^;^^^;c^^CT^^ 1740 

180 i H-f^ffi;*^*^^^ 1800 

1861 l^l^lll C J_ C _^ 1860 

imi -Hf^^III™:^^ 1920 

1981 Ilf^ff^f^^ff^ 1980 

2041 f^!!I!I?^™^^ 2040 

210 i *t-i.™iiir AG ^^ 2100 

+ + + 2160 



TTTCAGACTAAATCGAAAATCAAATCGTACTCTGACTA 1 



CGGGTCAGTAGAGAGGTCAACC 



2161 + - 



-+ + +- 



-+ + 2220 



2221 _______f^!*If^ff^ 

m m r + q dTTTTTITTVT-T"! 2280 

1 10 
T(nl04O) 

22 81 lll^l^^^ 

s s h 77 77777777771 "7777 2340 

20 30 
lintron 1 

2341 A I A !I^I AA !ff A f ATATGATT ^ TGTGAGT TTTTAATCGAATAATAATTTTAAAAAAA 

S D N G D ~M~ + I~~H + + + + 2400 

40 

2401 ^^^TAATATAAAGAATATTTTTGCAGTCATGTGGAACGGTTCGCGAGAAGAGACGGG 

+ r"":— + + + 2460" 

SCGTVREKRRE 
SO 

A(n718) 



2 4 61 -- -I- -l-^. f ^^^^^^AGATGTGGCGTTCGACGCGTTTTATGATGCTC 

i v K a77T7"g"T777777T771 2520 

60 70 



lintron 2 



2521 Il^flfl^fff^f 5 ^^ 

r s t g TTTTTTTTTTTTT's — + 2580 



80 90 
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# 



TTTTTAAAGTTCGGCGCAAAAGCAAGGGTCTCACGGAAAAAAGAGGCCGATCGTAATTTT 
2SQ1 + + + + ^ + 2g4o 

GCAACCCACCGGCACGGTTTTTTCCTCCGAAAATCGGAAATTATGCACTTTCCCAAATAT 
2641 + + + + + + 27Q0 

TT GAAGTGAAAT AT ATTTTATT TA CT GAAA GCTCGAGT GATT ATTTATTTTTTAAC ACTA 
2701 + + + + + + 276Q 

ATTTTCGTGGCGCAAAAGGCCATTTTGTAGATTTGCCGAAAATACTTGTCACACACACAC 

27 61 + + + + , t 

¥ + 2 820 



I 

ACACACATCTCCTTCAAATATCCCTTTTTCCAGTGTTGACTCGAATGCTGTCGAATTCGA 

2821 — —-+—.__.. . , ^ « „ « 

•r + + + + 2 880 

VDSNAVEFE 
100 

GTGTCCAATGTCACCGGCAAGCCATCGTCGGAGCCGCGCATTGAGCCCCGCCGGCTACAC 
28 81 + + + + + + 2 9 4 Q 

CPMSPASHRRSRALSPAGYT 

no 120 

TTCACCGACCCGAGTTCACCGTGACAGCGTCTCTTCAGTGTCATCATTCACTTCTTATCA 
29 41 + + + + + + 3ooq 

SPTRVHRDSVSSVSSFTSYQ 
130 140 

q ^ ATATC TACTCAAGAGCAAGATCTCGTTCTCGATCGCGTGCACTTCATTCATCGGATCG 

DIY SRARS RSRSRAL h"s""s""d"r + 3060 
150 160 

ACACAATTATTCATCTCCTCCAGTCAACGCATTTCCCAGCCAACCTTGTATGTTGATGCG * 
3061 +--: + + + 

HNYSSPPVNAFPSQPS 
170 

Repeat 1 

AACACTAAATTCTGAGAATGCGCATTACTCAACATATTTGACGCGCAAATATCTCGTAGC 
3121 - + + + + + + 3l8Q 



GAAAAATACAGTAACCCTTTAAATGACTATTGTAGTGTCGATTTACGGGCTCGATTTTCG 
3181 + + + + + + 324Q 

«--> 



AAACGAATATATGCTCGAATTGTGACAACGAATTTTAATTTGTCATTTTTGTGTTTTCTT 

+- 

Repeat 1 



3241 + + + , 

+ + -„+„.. + + 3300 



< — « 

TTGATATTTTTGATCAATTAATAAATTATTTCCGTAAACAGACACCAGCGCTACAGTACT 

3301 + — + j. . 

+ — + + + 336Q 



CTTTTAAAGAGTTACAGTAGTTTTCGCTTCAAGATATTTTGAAAAGAATTTTAAACATTT 

+ 3420 



3361 + + + + + 



TGAAAAAAAATCATCTAACATGTGCCAAAACGCTTTTTTCAAGTTTCGCAGATTTTTTGA 
3421 + + + + 



"+ + 3480 
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Repeat 2 



TTTTTTTCATTCAAGATATGCTTATTAACACATATAATTATCATTAATGTGAATTTCTTG 

+ + 3540 



3481 + + + + 



TAGAAATTTTGGGCTTTTCGTTCTAGTATGCTCTACTTTTGAAATTGCTCAACGAAAAAA 
3541 + + + + + + 3soQ 



TCATGTGGTTTGTTCATATGAATGACGAAAAATAGCAATTTTTTATATATTTTCCCCTAT 
3601 + + h + + + 36go 



TCATGTTGTGCAGAAAAATAGTAAAAAAGCGCATGCATTTTTCGACATTTTTTACATCGA 
3661 + + + + + + 3?2o 



— — ~— — — — „- 

ACGACAGCTCACTTCACATGCTGAAGACGAGAGACGCGGAGAAATACCACACATCTTTCT 
3721 -+ + „ + + + + 378Q 

Repeat 2 

<------——.— .—-„„„„„„„„„„ 



GCGTCTCTCGTCTTCAGCATGTGAAATGGGATCTCGGTCGATGTAAAAAAATGTCGAATA 
37 81 + + ^ + + + 



3840 



ATGTAAAAAATGCATGCGTTTTTTTACACTTTTCTGCACAAATGAATAGGGGGAAAATGT 
3841 + + + + + + 390Q 



ATTAAAATACATTTTTTGTATTTTTCAACATCACATGATTAACCCCATTATTTTTTCGTT 
3901 + + + + + + 396q 



GAGCAACTTAAAAAGTAGAGAATATTAGAGCGAAAACCAAAATTTCTTCAAGATATTACC 

+ + + + 4Q20 



TTTATTGATAATTATAGATGTTAATAAGCATATCTTGAATGAAAGTCAGCAAAAATATGT 

4081 TCG ^" C " GAAAA ^ TCAA ^ TTCT ^ G; ^^ 40&<r 

TTTTTG ^ T J TTTCTA ^ TCAC ATGAATGTACAAAATTAAAAGGG^^^I^^TTCTA 4 1 4 ° 

GAGGATATAATTGAATGAAACATTGCGAAATTAAAATGTGCGAAACGTCAAAAAAGAGGA 

4201 + + + + + + <2go 



^!T TG ^ TATCA ^ TC ^ TCCTA ^ CC ^"" TTTCAG ^ TCCGC CAACTCTTCAT 

+ 4320 

SANS 5 r 
180 



42 61 + + + + + 
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TCACCGGATGCTCTTCTCTCGGATACAGTTCAAGTCGTAATCGCTCATTCAGCAAAGCTT 
4321 h + + + + + 4380 

TGCSSLGYSSSRNRSFSKAS 
190 200 

CTGGACCAACTCAATACATATTCCATGAAGAGGATATGAACTTTGTCGATGCACCAACCA 

4381 ";'"": + 4 + + + + 4440 

GPTQYIFHEEDMNFVDAPTI 
210 220 

TAAGCCGTGTTTTCGACGAGAAAACCATGTACAGAAACTTCTCGAGTCCTCGTGGAATGT 
4441 + + „ + + + + 45Qo 

SRVFDEKTMYRKFSSPRG MC 
230 240 

GCCTCATCATAAATAATGAACACTTTGAGCAGATGCCAACACGGAATGGTACCAAGGCCG 
4501 ■+ + + + + + 456Q 

LI INNEHFEQMPTRNGTKAD 
250 260 

ACAAGGACAATCTTACCAATTTGTTCAGATGCATGGGCTATACGGTTATTTGCAAGGACA 
4 561 „„ + + + + + + 

KDNLTNLFRCMGYTVICKDN 
27 ° 280 

. ( intron 4 

ATCTGACGGGAAGGGTACGGCGAAATTATATTACCCAAACGCGAAATTTGCCATTTTGCG 

4621 TTVr + + + " + < 68 ° 



Repeat 3 

"•—--————————„«> 

CCGAAAATGTGGCGCCCGGTCTCGACACGACAATTTGTGTTAAATGCAAAAATGTATAAT 
4 6 81 + + + + • + + 7 

TTTGCAAAAAACAAAATTTTGAACTTCCGCGAAAATGATTTACCTAGTTTCGAAATTTTC 
4741 + + + + + + 48Qo 

4 8 01 GTTTTTTCC J^ TA ^ TTATGTGT 

ACCGTTTGTAAATTTTCAGACAATTTTCCGCATACAAAACTTGATAGCACGAAATCAATT 4 8 6 ° 
4 3 6 1 + + + + _ + + 492q 

TTCTGAATTTTCAAAATTATCCAAAAATGCACAATTTAAAATTTGTGAAAATTGGCAAAC 
4 921 +--'- + + + + + 498Q 

GGTGTTTCAATATGAAATGTATTTTTAAAAACTTTAAAAACCACTCCGGAAAAGCAATAA 
4981 + + + + + + 5o4Q 

AAATCAAAACAACGTCACAATTCAAATTCAAAAGTTATTCATCCGATTTGTTTATTTTTG 
5041 + + + + + + 5ioQ 

CAAAATTTGAAAAAATCATGAAGGATTTAGAAAAGTTTTATAACATTTTTTCTAGATTTT 
5101 + + + + + + 

TCAAAATTTTTTTTAACAAATCGAGAAAAAGAGAATGAAAAATCGATTTTAAAAATATCC 
5i 6 i + + + .„. + + + 522Q 

Repeat 3 

ACAGCTTCGAGAGTTTGAAATTACAGTACTCCTTAAAGGCGCACACCC^TTTG^TTGG 
5221 + + + + + + 52eo 



ACCAAAAATTTGTCGTGTCGAGACCAGGTACCGTAGTTTTTGTCGCAAAAATTGCA^-AT 
5281 + + + + + 534Q 

TGGACAATAAACCTTCCTAATCACCAAAAAGTAAAATTGAAATCTTCGAAAAGCCAAAAA 



5341 _ + + + + + 



-+ 5400 
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ATTCAAAAAAAAAGTCGAATTTCGATTTTTTTTTTGGTTTTTTGGTCCCAAAAACCAAAA 
540X + + + + + + 54go 

AAATCAATTTTCTGCAAAATACCAAAAAGAAACCCGAAAAAATTTCCCAGCCTTGTTCCT 
54 61 + + + h - + + 5520 

I 

AATGTAAACTGATATTTAATTTCCAGGGAATGCTCCTGACAATTCGAGACTTTGCCAAAC 
5521 4 + + + + + 5580 

GMLLTIRDFAKH 
290 3 00 

ACGAATCACACGGAGATTCTGCGATACTCGTGATTCTATCACACGGAGAAGAGAATGTGA ' 

5581 + + 4 + + 5640 

ESHGDSAILVILSHGEENVI 

310 320 

TTATTGGAGTTGATGATATACCGATTAGTACACACGAGATATATGATCTTCTCAACGCGG 
5641 + + + + + + s7oo 

IGVDDIPISTHEIYDLLNAA 

330 340 

A(n2433) 

CAAATGCTCCCCGTCTGGCGAATAAGCCGAAAATCGTTTTTGTGCAGGCTTGTCGAGGCG intr ° n 5 
5701 -—---+ + + + + + 5760 

NAP. RLANKPKIVFVQACRGE 

350 360 

GTTCGTTTTTTATTTTAATTTTAATATAAATATTTTAAATAAATTCATTTTCAGAACGTC 
5761 — + + + + „ + + 5Q2Q 

R R ] 

GTGACAATGGATTCCCAGTCTTGGATTCTGTCGACGGAGTTCCTGCATTTCTTCGTCGTG 
5821 — - + + + + + + 5880 

DNGFPVLDSVDGVPAFLRRG 
370 380 

T (nil 65) 

GATGGGACAATCGAGACGGGCCATTGTTCAATTTTCTTGGATGTGTGCGGCCGCAAGTTC 
5881 — +--- + + + + + 594Q 

WDNR DGPLFNFLGCVRPQVQ 
390 400 

I intron 6 

AGGTTGCAATTTAATTTCTTGAATGAGAATATTCCTTCAAAAAATCTAAAATAGATTTTT 
5941 + + + + + + 6ooq 

ATTCCAGAAAGTCCCGATCGAAAAATTGCGATATAATTACGAAATTTGTGATAAAATGAC 

6001 + + + + , , 

+ + 6060 

Repeat 4 

AAACCAATCAGCATCGTCGATCTCCGCCCACTTCATCGGATTGGTTTGAAAGTGGGCGGA 

6061 — + 4. j. _ , 

+ 4 + + + 612Q 

—————._> 

GTGAATTGCTGATTGGTCGCAGTTTTCAGTTTAGAGGGAATTTAAAAATCGCCTTTTCGA 
6121 + + + + + + 61gQ 

AAATTAAAAATTGATTTTTTCAATTTTTTCGAAAAATATTCCGATTATTTTATATTCTTT 
6181 + + + + + _ + 624Q 
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A(n717) 

GGAGCGAAAGCCCCGTCCTGTAAACATTTTTAAATCATAATTAATAAATTTTTGCAGCAA 
6241 + + + + + + 6300 

Q 

T<nl949) 
! 

GTGTGGAGAAAGAAGCCGAGCCAAGCTGACATTCTGATTCGATACGCAACGACAGCTCAA 
6301 + + + + + + 6360 

VWRKKPSQADILIRYATTAQ 
410 420 

A(nl286) 
I 

TATGTTTCGTGGAGAAACAGTGCTCGTGGATCATGGTTCATTCAAGCCGTCTGTGAAGTG 
6361 + + + + + + 6 420 

YVSWRNSARGSWFIQAVCEV 
430 440 

T(nll29,nll64) 
I 

TTCTCGACACACGCAAAGGATATGGATGTTGTTGAGCTGCTGACTGAAGTCAATAAGAAG 
6421 + + + + + __ + 6480 

FST HAKDM DVVELLTEVNKK 
450 460 

T<n2430) A(n2426) 
' I I intron 7 

GTCGCTTGTGGATTTCAGACATCACAGGGATCGAATATTTTGAAACAGATGCCAGAGGTA 
6481 + + + + + _ + , €540 

VACG FQ TS QG SN I LKQMP E 
470 480. 

Repeat 5 

CTTGAAACAAACAATGCATGTCTAACTI'TTAAGGACACAGAAAAATAGGCAGAGGCTCCT 
6541 + + + + + + 66Q0 



TTTGCAAGCCTGCCGCGCGTCAACCTAGAATTTTAGTTTTTAGCTAAAATGATTGATTTT 
660 i +_-' + + + ^ + g660 



GAATATTTTATGCTAATTTTTTTGCGTTAAATTTTGAAATAGTCACTATTTATCGGGTTT 
+ + + + + + 

CCAGTAAAAAATGTTTATTAGCCATTGGATTTTACTGAAAACGAAAATTTGTAGTTTTTC 



6721 ^ * + + + + 6780 

AACGAAATTTATCGATTTTTAAATGTAAAAAAAAATAGCGAAAATTACATCAACCATCAA 
6781 4 + + + + + 68 ^ 

GCATTTAAGCCAAAATTGTTAACTCATTTAAAAATTAATTCAAAGTTGTCCACGAGTATT 
6841 + + + + + + 690Q 

Repeat 5 

ACACGGTTGGCGCGCGGCAAGTTTGCAAAACGACGCTCCGCCTCTTTTTCTGTGCGGCTT 
6901 + + + + + + 696Q 



T (nll63) 



GAAAACAAGGGATCGGTTTAGATTTTTCCCCAAAATTTAAATTAAATTTCAGATGACATC 
+ + + + + + 

M T S 
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CCGCCTGCTCAAAAAGTTCTACTTTTGGCCGGAAGCACGAAACTCTGCCGTCTAAAATTC 
7021 h + h + 1 + 7080 

RLLKK FYFWPEARNSAV* 
490 500 

ACTCGTGATTCATTGCCCAATTGATAATTGTCTGTATCTTCTCCCCCAGTTCTCTTTCGC 
7081 + + + + + + 7140 

CCAATTAGTTTAAAACCATGTGTATATTGTTATCCTATACTCATTTCACTTTATCATTCT 
7141 + + + y y „+ 7200 

ATCATTTCTCTTCCCATTTTCACACATTTCCATTTCTCTACGATAATCTAAAATTATGAC 
72 01 + + + + + - + 7 260 

GTTTGTGTCTCGAACGCATAATAATTTTAATAACTCGTTTTGAATTTGATTAGTTGTTGT 
7261 + + + + + + 732Q 

GCCCAGTATATATGTATGTACTATGCTTCTATCAACAAAATAGTTTCATAGATCATCACC 
7321 + + + + + + 7380 

CCAACCCCACCAACCTACCGTACCATATTCATTTTTGCCGGGAATCAATTTCGATTAATT 
7381 + + + + + + 7440 

TTAACCTATTTTTTCGCCACAAAAAATCTAATATTTGAATTAACGAATAGCATTCCCATC 
74 41 + + + + _ + + 75Q0 

TCTCCCGTGCCGGAATGCCTCCCGGCCTTTTAAAGTTCGGAACATTTGGCAATTATGTAT 
7S01 + + + + + + 756Q 

AAATTTGTAGGTCCCCCCCATCATTTCCCGCCCATCATCTCAAATTGCATTCTTTTTTCG 
7561 + + + + (. + 762Q 

CCGTGATATCCCGATTCTGGTCAGCAAAGATCT 
7621 + + + 7653 
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